@inproceedings{krizhevsky2012imagenet,
  author    = {Krizhevsky, Alex and Sutskever, Ilya and Hinton, Geoffrey E},
  title     = {{ImageNet} classification with deep convolutional neural networks},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {1097--1105},
  year      = {2012},
}
@article{simonyan2014very,
  author  = {Simonyan, Karen and Zisserman, Andrew},
  title   = {Very deep convolutional networks for large-scale image recognition},
  journal = {arXiv preprint arXiv:1409.1556},
  year    = {2014},
}
@inproceedings{he2016deep,
  author    = {He, Kaiming and Zhang, Xiangyu and Ren, Shaoqing and Sun, Jian},
  title     = {Deep residual learning for image recognition},
  booktitle = {Proceedings of the {IEEE} Conference on Computer Vision and Pattern Recognition},
  pages     = {770--778},
  year      = {2016},
}
@inproceedings{kendall2017uncertainties,
  author    = {Kendall, Alex and Gal, Yarin},
  title     = {What uncertainties do we need in {Bayesian} deep learning for computer vision?},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {5574--5584},
  year      = {2017},
}
@inproceedings{kwon2018uncertainty,
  author    = {Kwon, Yongchan and Won, Joong-Ho and Kim, Beom Joon and Paik, Myunghee Cho},
  title     = {Uncertainty quantification using {Bayesian} neural networks in classification: Application to ischemic stroke lesion segmentation},
  booktitle = {Medical Imaging with Deep Learning ({MIDL})},
  year      = {2018},
}
@article{buntine1991bayesian,
  author  = {Buntine, Wray L and Weigend, Andreas S},
  title   = {{Bayesian} back-propagation},
  journal = {Complex Systems},
  volume  = {5},
  number  = {6},
  pages   = {603--643},
  year    = {1991},
}
@inproceedings{hinton1993keeping,
  author       = {Hinton, Geoffrey E and Van Camp, Drew},
  title        = {Keeping the neural networks simple by minimizing the description length of the weights},
  booktitle    = {Proceedings of the sixth annual conference on Computational learning theory},
  organization = {ACM},
  pages        = {5--13},
  year         = {1993},
}
@inproceedings{hochreiter1995simplifying,
  author    = {Hochreiter, Sepp and Schmidhuber, J{\"u}rgen},
  title     = {Simplifying neural nets by discovering flat minima},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {529--536},
  year      = {1995},
}
@inproceedings{denker1991transforming,
  author    = {Denker, John S and LeCun, Yann},
  title     = {Transforming neural-net output levels to probability distributions},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {853--859},
  year      = {1991},
}
@article{mackay1995probable,
  author    = {MacKay, David JC},
  title     = {Probable networks and plausible predictions---a review of practical {Bayesian} methods for supervised neural networks},
  journal   = {Network: Computation in Neural Systems},
  volume    = {6},
  number    = {3},
  pages     = {469--505},
  year      = {1995},
  publisher = {Taylor \& Francis},
}
@book{neal2012bayesian,
  author    = {Neal, Radford M},
  title     = {{Bayesian} learning for neural networks},
  series    = {Lecture Notes in Statistics},
  volume    = {118},
  publisher = {Springer Science \& Business Media},
  year      = {2012},
}
@article{graves2016stochastic,
  author  = {Graves, Alex},
  title   = {Stochastic backpropagation through mixture density distributions},
  journal = {arXiv preprint arXiv:1607.05690},
  year    = {2016},
}
@article{srivastava2014dropout,
  author    = {Srivastava, Nitish and Hinton, Geoffrey and Krizhevsky, Alex and Sutskever, Ilya and Salakhutdinov, Ruslan},
  title     = {Dropout: a simple way to prevent neural networks from overfitting},
  journal   = {The Journal of Machine Learning Research},
  volume    = {15},
  number    = {1},
  pages     = {1929--1958},
  year      = {2014},
  publisher = {JMLR.org},
}
@inproceedings{wang2013fast,
  author    = {Wang, Sida and Manning, Christopher},
  title     = {Fast dropout training},
  booktitle = {International Conference on Machine Learning},
  pages     = {118--126},
  year      = {2013},
}

@inproceedings{coates2011analysis,
  author    = {Coates, Adam and Ng, Andrew and Lee, Honglak},
  title     = {An analysis of single-layer networks in unsupervised feature learning},
  booktitle = {Proceedings of the Fourteenth International Conference on Artificial Intelligence and Statistics},
  pages     = {215--223},
  year      = {2011},
}

@article{blundell2015weight,
  author  = {Blundell, Charles and Cornebise, Julien and Kavukcuoglu, Koray and Wierstra, Daan},
  title   = {Weight uncertainty in neural networks},
  journal = {arXiv preprint arXiv:1505.05424},
  year    = {2015},
}
@online{xiao2017/online,
  author       = {Han Xiao and Kashif Rasul and Roland Vollgraf},
  title        = {{Fashion-MNIST}: a Novel Image Dataset for Benchmarking Machine Learning Algorithms},
  date         = {2017-08-28},
  year         = {2017},
  eprintclass  = {cs.LG},
  eprinttype   = {arXiv},
  eprint       = {1708.07747},
}
@inproceedings{graves2011practical,
  author    = {Graves, Alex},
  title     = {Practical variational inference for neural networks},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {2348--2356},
  year      = {2011},
}
@article{fortunato2017bayesian,
  author  = {Fortunato, Meire and Blundell, Charles and Vinyals, Oriol},
  title   = {Bayesian recurrent neural networks},
  journal = {arXiv preprint arXiv:1704.02798},
  year    = {2017},
}
@article{lecun1998gradient,
  author    = {LeCun, Yann and Bottou, L{\'e}on and Bengio, Yoshua and Haffner, Patrick},
  title     = {Gradient-based learning applied to document recognition},
  journal   = {Proceedings of the IEEE},
  volume    = {86},
  number    = {11},
  pages     = {2278--2324},
  year      = {1998},
  publisher = {IEEE},
}
@incollection{neal1998view,
  author    = {Neal, Radford M and Hinton, Geoffrey E},
  title     = {A view of the {EM} algorithm that justifies incremental, sparse, and other variants},
  booktitle = {Learning in Graphical Models},
  pages     = {355--368},
  year      = {1998},
  publisher = {Springer},
}
@article{yedidia2005constructing,
  author    = {Yedidia, Jonathan S and Freeman, William T and Weiss, Yair},
  title     = {Constructing free-energy approximations and generalized belief propagation algorithms},
  journal   = {IEEE Transactions on Information Theory},
  volume    = {51},
  number    = {7},
  pages     = {2282--2312},
  year      = {2005},
  publisher = {IEEE},
}
@article{friston2007variational,
  author    = {Friston, Karl and Mattout, J{\'e}r{\'e}mie and Trujillo-Barreto, Nelson and Ashburner, John and Penny, Will},
  title     = {Variational free energy and the {Laplace} approximation},
  journal   = {NeuroImage},
  volume    = {34},
  number    = {1},
  pages     = {220--234},
  year      = {2007},
  publisher = {Elsevier},
}
@techreport{krizhevsky2009learning,
  author      = {Krizhevsky, Alex and Hinton, Geoffrey},
  title       = {Learning multiple layers of features from tiny images},
  institution = {University of Toronto},
  year        = {2009},
}
@inproceedings{kingma2015variational,
  author    = {Kingma, Diederik P and Salimans, Tim and Welling, Max},
  title     = {Variational dropout and the local reparameterization trick},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {2575--2583},
  year      = {2015},
}
@article{neklyudov2018variance,
  author  = {Neklyudov, Kirill and Molchanov, Dmitry and Ashukha, Arsenii and Vetrov, Dmitry},
  title   = {Variance Networks: When Expectation Does Not Meet Your Expectations},
  journal = {arXiv preprint arXiv:1803.03764},
  year    = {2018},
}
@article{lipton2016efficient,
  author  = {Lipton, Zachary C and Gao, Jianfeng and Li, Lihong and Li, Xiujun and Ahmed, Faisal and Deng, Li},
  title   = {Efficient exploration for dialogue policy learning with {BBQ} networks \& replay buffer spiking},
  journal = {arXiv preprint arXiv:1608.05081},
  year    = {2016},
}
@article{kullback1951information,
  author    = {Kullback, Solomon and Leibler, Richard A},
  title     = {On information and sufficiency},
  journal   = {The Annals of Mathematical Statistics},
  volume    = {22},
  number    = {1},
  pages     = {79--86},
  year      = {1951},
  publisher = {JSTOR},
}
@article{kingma2014adam,
  author  = {Kingma, Diederik P and Ba, Jimmy},
  title   = {Adam: A method for stochastic optimization},
  journal = {arXiv preprint arXiv:1412.6980},
  year    = {2014},
}
@article{houthooft2016curiosity,
  author  = {Houthooft, Rein and Chen, Xi and Duan, Yan and Schulman, John and De Turck, Filip and Abbeel, Pieter},
  title   = {Curiosity-driven exploration in deep reinforcement learning via {Bayesian} neural networks},
  journal = {arXiv preprint arXiv:1605.09674},
  year    = {2016},
}
@article{stark2018preproduce,
  author  = {Stark, Philip B.},
  title   = {Before reproducibility must come preproducibility},
  journal = {Nature},
  volume  = {557},
  pages   = {613},
  year    = {2018},
}
@article{molchanov2017variational,
  author  = {Molchanov, Dmitry and Ashukha, Arsenii and Vetrov, Dmitry},
  title   = {Variational dropout sparsifies deep neural networks},
  journal = {arXiv preprint arXiv:1701.05369},
  year    = {2017},
}
@article{hinton2012improving,
  author  = {Hinton, Geoffrey E and Srivastava, Nitish and Krizhevsky, Alex and Sutskever, Ilya and Salakhutdinov, Ruslan R},
  title   = {Improving neural networks by preventing co-adaptation of feature detectors},
  journal = {arXiv preprint arXiv:1207.0580},
  year    = {2012},
}
@article{gal2015bayesian,
  author  = {Gal, Yarin and Ghahramani, Zoubin},
  title   = {{Bayesian} convolutional neural networks with {Bernoulli} approximate variational inference},
  journal = {arXiv preprint arXiv:1506.02158},
  year    = {2015},
}
@inproceedings{glorot2010understanding,
  author    = {Glorot, Xavier and Bengio, Yoshua},
  title     = {Understanding the difficulty of training deep feedforward neural networks},
  booktitle = {Proceedings of the Thirteenth International Conference on Artificial Intelligence and Statistics},
  pages     = {249--256},
  year      = {2010},
}
@misc{Karparthy,
  author       = {Karpathy, Andrej},
  title        = {Neural Networks 1},
  howpublished = {\url{http://cs231n.github.io/neural-networks-1/}},
  note         = {Online},
  year         = {2016},
}
@misc{lecun-mnisthandwrittendigit-2010,
  author   = {LeCun, Yann and Cortes, Corinna},
  title    = {{MNIST} handwritten digit database},
  url      = {http://yann.lecun.com/exdb/mnist/},
  year     = {2010},
  added-at = {2010-06-28T21:16:30.000+0200},
}
@article{Torralba:2008:MTI:1444381.1444403,
  author     = {Torralba, Antonio and Fergus, Rob and Freeman, William T.},
  title      = {80 Million Tiny Images: A Large Data Set for Nonparametric Object and Scene Recognition},
  journal    = {IEEE Trans. Pattern Anal. Mach. Intell.},
  volume     = {30},
  number     = {11},
  month      = nov,
  year       = {2008},
  issue_date = {November 2008},
}
@InProceedings{10.1007/978-3-642-40760-4_2,
  author    = {Shi, Wenzhe and Caballero, Jose and Ledig, Christian and Zhuang, Xiahai and Bai, Wenjia and Bhatia, Kanwal and de Marvao, Antonio M. Simoes Monteiro and Dawes, Tim and O'Regan, Declan and Rueckert, Daniel},
  editor    = {Mori, Kensaku and Sakuma, Ichiro and Sato, Yoshinobu and Barillot, Christian and Navab, Nassir},
  title     = {Cardiac Image Super-Resolution with Global Correspondence Using Multi-Atlas PatchMatch},
  booktitle = {Medical Image Computing and Computer-Assisted Intervention -- MICCAI 2013},
  publisher = {Springer Berlin Heidelberg},
  year      = {2013},
}

@ARTICLE{1203152,
  author   = {B. K. Gunturk and A. U. Batur and Y. Altunbasak and M. H. Hayes and R. M. Mersereau},
  title    = {Eigenface-domain super-resolution for face recognition},
  journal  = {IEEE Transactions on Image Processing},
  volume   = {12},
  number   = {5},
  pages    = {597--606},
  month    = may,
  year     = {2003},
  doi      = {10.1109/TIP.2003.811513},
  ISSN     = {1057-7149},
  keywords = {face recognition;image resolution;eigenvalues and eigenfunctions;image reconstruction;eigenface-domain super-resolution;face recognition;surveillance cameras;reconstruction;visually improved high-quality image;low dimensional domain;face-space super-resolution;registration errors;noise;Face recognition;Image resolution;Image reconstruction;Surveillance;Computational complexity;Noise robustness;Cameras;Reconstruction algorithms;Image recognition},
}
@inproceedings{Yang2014SingleImageSA,
  author    = {Yang, Chih-Yuan and Ma, Chao and Yang, Ming-Hsuan},
  title     = {Single-Image Super-Resolution: A Benchmark},
  booktitle = {ECCV},
  year      = {2014},
}
@article{DBLP:journals/corr/ShiCHTABRW16,
  author = {Shi, Wenzhe and Caballero, Jose and Husz{\'{a}}r, Ferenc and Totz, Johannes and Aitken, Andrew P. and Bishop, Rob and Rueckert, Daniel and Wang, Zehan},
  title = {Real-Time Single Image and Video Super-Resolution Using an Efficient Sub-Pixel Convolutional Neural Network},
  journal = {CoRR},
  volume = {abs/1609.05158},
  year = {2016},
  url = {http://arxiv.org/abs/1609.05158},
  archivePrefix = {arXiv},
  eprint = {1609.05158},
  timestamp = {Mon, 13 Aug 2018 16:47:09 +0200},
  biburl = {https://dblp.org/rec/bib/journals/corr/ShiCHTABRW16},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{goodfellow2014generative,
  author    = {Goodfellow, Ian and Pouget-Abadie, Jean and Mirza, Mehdi and Xu, Bing and Warde-Farley, David and Ozair, Sherjil and Courville, Aaron and Bengio, Yoshua},
  title     = {Generative adversarial nets},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {2672--2680},
  year      = {2014},
}
@article{DBLP:journals/corr/RadfordMC15,
  author = {Radford, Alec and Metz, Luke and Chintala, Soumith},
  title = {Unsupervised Representation Learning with Deep Convolutional Generative Adversarial Networks},
  journal = {CoRR},
  volume = {abs/1511.06434},
  year = {2015},
}
@misc{Gluon,
  author       = {{Gluon MXnet}},
  title        = {chapter18\_variational-methods-and-uncertainty},
  howpublished = {\url{https://gluon.mxnet.io/chapter18_variational-methods-and-uncertainty/bayes-by-backprop.html}},
  note         = {Online},
  year         = {2017},
}
@article{DBLP:journals/corr/KingmaB14,
  author = {Kingma, Diederik P. and Ba, Jimmy},
  title = {Adam: {A} Method for Stochastic Optimization},
  journal = {CoRR},
  volume = {abs/1412.6980},
  year = {2014},
}
@InProceedings{pmlr-v15-coates11a,
  author    = {Adam Coates and Andrew Ng and Honglak Lee},
  title     = {An Analysis of Single-Layer Networks in Unsupervised Feature Learning},
  booktitle = {Proceedings of the Fourteenth International Conference on Artificial Intelligence and Statistics},
  editor    = {Geoffrey Gordon and David Dunson and Miroslav Dud{\'\i}k},
  series    = {Proceedings of Machine Learning Research},
  volume    = {15},
  pages     = {215--223},
  address   = {Fort Lauderdale, FL, USA},
  month     = {11--13 Apr},
  year      = {2011},
  publisher = {PMLR},
}
@inproceedings{Gal2015Dropout,
  author    = {Yarin Gal and Zoubin Ghahramani},
  title     = {Dropout as a {Bayesian} approximation: Insights and Applications},
  booktitle = {Deep Learning Workshop, ICML},
  year      = {2015},
}
@comment{
  Disabled duplicate: the citation key hinton1993keeping is already defined
  earlier in this file, and a repeated key makes BibTeX report a
  repeated-entry error and skip this copy anyway. The fields of the
  duplicate are kept below for reference (leading at-sign removed).

  inproceedings{hinton1993keeping,
      Author = {Hinton, G. and Van Camp, D.},
      Booktitle = {Computational Learning Theory},
      Organization = {ACM},
      Pages = {5--13},
      Title = {Keeping the neural networks simple by minimizing the description length of the weights},
      Year = {1993}
  }
}
@article{barber1998ensemble,
  author    = {Barber, David and Bishop, Christopher M},
  title     = {Ensemble learning in {Bayesian} neural networks},
  journal   = {{NATO ASI} Series F: Computer and Systems Sciences},
  volume    = {168},
  pages     = {215--238},
  year      = {1998},
  publisher = {Springer-Verlag},
}
@article{Rumelhart,
  author  = {Rumelhart, David E. and Hinton, Geoffrey E. and Williams, Ronald J.},
  title   = {Learning Representations by Back Propagating Errors},
  journal = {Nature},
  volume  = {323},
  pages   = {533--536},
  month   = oct,
  year    = {1986},
  doi     = {10.1038/323533a0},
}
@incollection{mackay1996hyperparameters,
  author    = {MacKay, David JC},
  title     = {Hyperparameters: optimize, or integrate out?},
  booktitle = {Maximum Entropy and {Bayesian} Methods},
  pages     = {43--59},
  year      = {1996},
  publisher = {Springer},
}
@article{Mackay1991APB,
  author  = {MacKay, David J. C.},
  title   = {A Practical {Bayesian} Framework for Backpropagation Networks},
  journal = {Neural Computation},
  volume  = {4},
  number  = {3},
  pages   = {448--472},
  year    = {1992},
}
@article{Jylanki:2014:EPN:2627435.2638593,
  author     = {Jyl{\"a}nki, Pasi and Nummenmaa, Aapo and Vehtari, Aki},
  title      = {Expectation Propagation for Neural Networks with Sparsity-promoting Priors},
  journal    = {J. Mach. Learn. Res.},
  issue_date = {January 2014},
  volume     = {15},
  number     = {1},
  month      = jan,
  year       = {2014},
  issn       = {1532-4435},
  pages      = {1849--1901},
  numpages   = {53},
  url        = {http://dl.acm.org/citation.cfm?id=2627435.2638593},
  acmid      = {2638593},
  publisher  = {JMLR.org},
}
@inproceedings{Soudry:NIPS2014_5269,
  author    = {Soudry, Daniel and Hubara, Itay and Meir, Ron},
  title     = {Expectation Backpropagation: Parameter-Free Training of Multilayer Neural Networks with Continuous or Discrete Weights},
  booktitle = {Advances in Neural Information Processing Systems 27},
  editor    = {Ghahramani, Z. and Welling, M. and Cortes, C. and Lawrence, N. D. and Weinberger, K. Q.},
  pages     = {963--971},
  publisher = {Curran Associates, Inc.},
  year      = {2014},
  url       = {http://papers.nips.cc/paper/5269-expectation-backpropagation-parameter-free-training-of-multilayer-neural-networks-with-continuous-or-discrete-weights.pdf},
}
@article{DBLP:journals/corr/HanMD15,
  author    = {Song Han and
               Huizi Mao and
               William J. Dally},
  title     = {Deep Compression: Compressing Deep Neural Network with Pruning, Trained
               Quantization and {Huffman} Coding},
  journal   = {CoRR},
  volume    = {abs/1510.00149},
  year      = {2015},
  url       = {http://arxiv.org/abs/1510.00149},
  archivePrefix = {arXiv},
  eprint    = {1510.00149},
  timestamp = {Mon, 13 Aug 2018 16:48:14 +0200},
  biburl    = {https://dblp.org/rec/bib/journals/corr/HanMD15},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/NarangDSE17,
  author = {Narang, Sharan and Diamos, Gregory F. and Sengupta, Shubho and Elsen, Erich},
  title = {Exploring Sparsity in Recurrent Neural Networks},
  journal = {CoRR},
  volume = {abs/1704.05119},
  year = {2017},
  url = {http://arxiv.org/abs/1704.05119},
  archivePrefix = {arXiv},
  eprint = {1704.05119},
  timestamp = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl = {https://dblp.org/rec/bib/journals/corr/NarangDSE17},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{lecun1990optimal,
  author    = {LeCun, Yann and Denker, John S and Solla, Sara A},
  title     = {Optimal brain damage},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {598--605},
  year      = {1990},
}
@article{DBLP:journals/corr/AnwarHS15,
  author = {Anwar, Sajid and Hwang, Kyuyeon and Sung, Wonyong},
  title = {Structured Pruning of Deep Convolutional Neural Networks},
  journal = {CoRR},
  volume = {abs/1512.08571},
  year = {2015},
  url = {http://arxiv.org/abs/1512.08571},
  archivePrefix = {arXiv},
  eprint = {1512.08571},
  timestamp = {Mon, 13 Aug 2018 16:46:45 +0200},
  biburl = {https://dblp.org/rec/bib/journals/corr/AnwarHS15},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/LebedevGROL14,
  author = {Lebedev, Vadim and Ganin, Yaroslav and Rakhuba, Maksim and Oseledets, Ivan V. and Lempitsky, Victor S.},
  title = {Speeding-up Convolutional Neural Networks Using Fine-tuned CP-Decomposition},
  journal = {CoRR},
  volume = {abs/1412.6553},
  year = {2014},
}
@article{DBLP:journals/corr/ChangpinyoSZ17,
  author = {Changpinyo, Soravit and Sandler, Mark and Zhmoginov, Andrey},
  title = {The Power of Sparsity in Convolutional Neural Networks},
  journal = {CoRR},
  volume = {abs/1702.06257},
  year = {2017},
}
@article{DBLP:journals/corr/GongLYB14,
  author = {Gong, Yunchao and Liu, Liu and Yang, Ming and Bourdev, Lubomir D.},
  title = {Compressing Deep Convolutional Networks using Vector Quantization},
  journal = {CoRR},
  volume = {abs/1412.6115},
  year = {2014},
}
@inproceedings{denton2014exploiting,
  author    = {Denton, Emily L and Zaremba, Wojciech and Bruna, Joan and LeCun, Yann and Fergus, Rob},
  title     = {Exploiting linear structure within convolutional networks for efficient evaluation},
  booktitle = {Advances in Neural Information Processing Systems},
  pages     = {1269--1277},
  year      = {2014},
}
@inproceedings{DBLP:conf/nips/AlvarezS16,
  author = {Alvarez, Jose M. and Salzmann, Mathieu},
  title = {Learning the Number of Neurons in Deep Networks},
  booktitle = {{NIPS}},
  pages = {2262--2270},
  year = {2016},
}
@article{Kiureghian,
  author  = {Der Kiureghian, Armen and Ditlevsen, Ove},
  title   = {Aleatory or Epistemic? Does It Matter?},
  journal = {Structural Safety},
  volume  = {31},
  pages   = {105--112},
  month   = mar,
  year    = {2009},
  doi     = {10.1016/j.strusafe.2008.06.020},
}
@inproceedings{lafferty2001conditional,
  author    = {Lafferty, John and McCallum, Andrew and Pereira, Fernando CN},
  title     = {Conditional random fields: Probabilistic models for segmenting and labeling sequence data},
  booktitle = {Proceedings of the Eighteenth International Conference on Machine Learning ({ICML})},
  pages     = {282--289},
  year      = {2001},
}
@InProceedings{MartinFTM01,
  author    = {D. Martin and C. Fowlkes and D. Tal and J. Malik},
  title     = {A Database of Human Segmented Natural Images and its
               Application to Evaluating Segmentation Algorithms and
               Measuring Ecological Statistics},
  booktitle = {Proc. 8th Int'l Conf. Computer Vision},
  volume    = {2},
  pages     = {416--423},
  month     = jul,
  year      = {2001},
}
@comment{
  Disabled duplicate: the citation key DBLP:journals/corr/RadfordMC15 is
  already defined earlier in this file with the same data, and a repeated
  key makes BibTeX report a repeated-entry error. The fields of the
  duplicate are kept below for reference (leading at-sign removed).

  article{DBLP:journals/corr/RadfordMC15,
    author    = {Alec Radford and
                 Luke Metz and
                 Soumith Chintala},
    title     = {Unsupervised Representation Learning with Deep Convolutional Generative
                 Adversarial Networks},
    journal   = {CoRR},
    volume    = {abs/1511.06434},
    year      = {2015}
  }
}
@article{shridhar2018bayesian,
  author  = {Shridhar, Kumar and Laumann, Felix and Llopart Maurin, Adrian and Olsen, Martin and Liwicki, Marcus},
  title   = {Bayesian Convolutional Neural Networks with Variational Inference},
  journal = {arXiv preprint arXiv:1806.05978},
  year    = {2018},
}
@article{hafner2018reliable,
  author  = {Hafner, Danijar and Tran, Dustin and Irpan, Alex and Lillicrap, Timothy and Davidson, James},
  title   = {Reliable uncertainty estimates in deep neural networks using noise contrastive priors},
  journal = {arXiv preprint arXiv:1807.09289},
  year    = {2018},
}
@article{tibshirani1996regression,
  author    = {Tibshirani, Robert},
  title     = {Regression shrinkage and selection via the lasso},
  journal   = {Journal of the Royal Statistical Society. Series B (Methodological)},
  volume    = {58},
  number    = {1},
  pages     = {267--288},
  year      = {1996},
  publisher = {JSTOR},
}
    